APPENDIX A - 24/8 Update Method 

if (pref ix__length <= 24) { 

prefix_diff = 24 - pref ix__length; 

prefix = ip__addr » (32 - pref ix_length) ; 

for (ui = 0; ui < (1 << prefix_diff } ; ui++) { 

// compute index into first level table T1_RIB 
tl_index - (prefix << prefix_diff) + ui; 
result [15 : 0] = T1_RIB [tl_index] ; 

if ( result [15] == 1'bO) { 

// the first bit in T1_RIB is 0 

old_pref ix_length = result [5:0]; 

if (old_j>ref ix_length <~ pref ix_length) { 

// update with new next hop and prefix length 

T1_RIB [tl_index] = (next_hop <<6 +pref ix_length) 
St 0x7FFF; 

} 

} 

else { // the first bit is 1 

for (uj = 0; uj < 256; uj++} { 

t2_index = result [14: 6] <<8 +u j ; 
t2_result [15 :0] = T2_RIB [t2_index] ; 

if (t2_result [5:0] <= pref ix_length) { 

// assign next next hop and prefix length 
T2_RIB[t2_index] = (next_hop « 6) + pref ix__length; 
} 

} // end of FOR loop 
} // end of ELSE loop 
} // end of FOR loop 
} // end of IF loop 

else { // i.e., pref ix_length > 24 

offset_size - 32 - pref ix_length; 
prefix_diff = pref ix_length - 24; 
tl_index = ip_addr [31 : 8] ; 
tl_result [15:0] = T1_RIB [tl_index] ; 

// find the end bit position in the ip address and compute offset 
offset = ip_addr [7 :of f set_size] ; 
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if (tl_result [15] =- l'bO) { // the first bit is 0 in T1_RIB 
index = get_index{); // get a new index into T2JRIB 
// compute the begin & end address of the segment in T2_RIB 
segment_begin_addr = {index « 8) + offset; 
segment_end_addr = (index <<8) + offset + 
(1 << of f set__size) - 1; 

// update T1_RIB with the next index and mark 1st bit to 1 
T1_RIB [tl_index] = {index « 6) | 0x8000; 

for (uj = 0; uj < 256; uj++) { 

t2_index = (index << 8) + uj ; 

if { {t2_index >= segment_begin_addr) && 
{t2_index < = segment_end_addr) ) { 
// this is the segment needs to be updated 
// with new NH and prefix length information. 
T2_RIB [t2_index] = (next_hop << 6)+prefix length; 

} 

else { // update unmatching segment with old NH & PL 
T2_RIB [t2_index] = tl_result [15:0] ; 

} 

} // end of FOR loop 
} // end of IF loop 
else { // the first bit in T1_RIB is 1 
index = tl_result [14 : 6] ; 

// compute the begin & end address of the segment in T2JRIB 
segment_begin_addr = {index << 8) + offset; 
segment_end_addr = {index <<8) + offset + 
(1 << offset_size) - 1; 

for (uj = 0; uj < 256; uj++) { 

t2_index = (index << 8) + u j ; 
if ( (t2_index >= segment_begin_addr) && 
(t2_index <= segment_end_addr) ) { 
// this is the segment matching the prefix 
old_j)ref ix__length = T2_RIB [t2_index] & 0xO03F; 
if (oldj>ref ix__length pref ix_length) { 
// need to update wit new NH and PL 
T2_RIB [t2_index] = (next_hop<<6) +pref ix length; 

} 

} // end of IF loop 
} // end of FOR loop 
} // end of ELSE loop 
} // end of ELSE loop 
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APPENDIX B - Pseudo Code of 24/8c Route Lookup Method 



// get segment and offsets from IP address 
segment [17 : 0] = ip_addr [31 : 14] ; 
offsetl[5:0] = ip_addr [13 : 8] ; 
offset2[7:0] = ip_addr [7:0] ; 

tl_result [95:0] = T1_RIB [segment] ; 

/ / compute the number of ones in the bit map 

all_ones = compute_num_ones_in_bitmap (tl__result [95:0] ) ; 
K = 95 - offsetl [5:0] ; 

leading_ones = compute_num_ones__in_bitmap (tl_result [95 :K] ) 

if (all_ones <= 2) { 
if (leading_ones == 1) 
nhpl[15:0] = tl_result [31:16] ; 
else 

nhpl[15:0] = tl_result [15 : 0] ; 
} 

else { // the total number of one's is more than 2 
address = tl_result [31 : 0] ; 

current_address = address + leading_ones - 1; 

/ / retrieve nhpl value stored in the address 
nhpl[15:0] = *current_address ; 

} 

if ( (nhpl [15] == l'bO) { // first bit in NHPL is 0 
next_hop = nhpl [14 : 6] ; 

} 

else { // first bit in NHPL is 1 
index__t2 = nhpl [14:0]; 
t2_index = index_t2 << 8 + offset2; 
t2_result [15 : 0] = T2_RIB [t2_index] ; 
next_hop = t2_result [15 : 6] ; 

} 
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APPENDIX C Pseudo Code of 24/8c Route Update Method 



segment = ( (ip_addr) >>14) ; // get the first 18 significant bits 
new_nhpl = (next_hop<<6) + pref ix_length; // compute new NHPL 

if (pref ix_length <= 18) { 

//NO need to change the bitmap 

// only need to update NHPL array as needed 

pl_diff = 18 - pref ix_JLength; 

tl_base = ( segment > >pl_dif f) <<pl_diff; 

for (ti = 0; ti < (l«pl_diff ) ; ti++) { 
tl__index - tl_base + ti; 
tl_result = &(Tl_RIB[tl_index] ) ; 

bmp = tl_result->bmp; // bmp stores 64 bitmap tl_entry [95 : 32] ; 
all_ones = count_leading_ones (bmp, 63); 

for (i = 1; i <= all_ones; i++) { 

// walk thr ought the NHPL array and make changes as needed 

// get the old nhpl 

// i indicates the leading ones 

nhpl = get_current_nhpl (tl__result , all_ones, i) ; 

if ( (nhpl & 0x8000) ==0) { // marker bit is 0 
old_pl = (nhpl & 0x003F) ; 

if ( (oldjpl <= pref ix_length) && (nhpl 1= new_nhpl) ) { 
// update T1_RIB with new nhpl 

replace_current_nhpl (tl_result, all_ones, i, new_nhpl) ; 

} 

} 

else { // marker bit is 1 

t2_index = ( (nhpl & 0x7FFF) << 8) ; // times 256 
begin_index = t2_index; 
end_index = t2_index + 255; 

update_t2_rib (begin_index, end_index, pref ix_length, next_hop) ; 

} 

} // end of for (i = 1; i <= all_ones; ...) 
} // end of for (ti = 0; ...) 
} // end of if (pref ix_length <= 18) 

else if (pref ix__length <= 24) { // 18 < pref ix__length <= 24 

/ / get the next 6 bits after the significant 18 bits as of f setl 
offsetl - ( (ip_addr<<18) »26) ; // 6 bits 
pl_diff = 24 - pref ix_length; 

tl_result = &<T1_RIB [segment] ) ; 

tl_bmp_base = ( (offsetl >> pl_dif f ) << pl_dif f ) ; 

for (ti = 0; ti < (1 << pl_dif f ) ; ti++) { 

pos = tl_bmp_base + ti; // get the bit position 

/ / count the number of all ones and leading ones 
bmp = tl_result->bmp; 

all_ones = count_leading_ones (bmp, 63); 



TEN-008 2-8.D0C 



46 



leading_ones = count_leading_ones (bmp, pos); 
// get the old prefix info 

nhpl = get_current_nhpl (tl_result , all_ones, leading_ones) ; 

if ( ( (nhpl & 0x8000) == 0) && (nhpl i= new_nhpl) ) { 
// the marker bit is 0 and new nhpl is NOT equal to the old nhpl 
// in this case, we may need to change bitmap and nhpls 
oldjpl = (nhpl & 0x003F) ; 
if (old_pl <= pref ix_length) { 

// update with new nhpl and update bitmap 

cb = ((bmp << pos) » 63); // get current bit 

if (pos == 0) { // this is the first bit 
// get the next bit 
nb = ( (bmp << (pos + 1) ) >> 63) ; 

if (nb ==0) { // change the bitmap "10x" --> 
tl_result->bmp |= OXC00OO0O0OO0O0OO0LL; 
// since pos 0, leading_ones has to be 1 
insert_bef ore_pos_nhpl ( tl_result , all_ones , 

} 

else { // nb == 1 

next_nhpl = get_next__nhpl ( tl_result , all__ones , leading_ones) 
if ( next_nhpl — new_nhpl) { 

// change the bitmap "llx" --> "lOx" , set next bit to 0 

bits_mask = (1LL<< (62 -pos) ) ; 

tl_result- >bmp &= -bits_mask; 

delete_current__nhpl (tl_result , all_ones, leading_ones) ; 

} 

else { //no need to change the bitmap "llx" 

rep 1 ace_current_nhpl (tl_re suit , all__ones, 1, new_nhpl) ; 

} 

} 

} // end of if (pos == 0) 

else if (pos 63) { // end bit 
if (cb — 0) { // current bit is 0 

// change bit map from "x0" --> "xl" 

tl_result->bmp = (tl_result->bmp | OxOOOOOOOOOOOOOOOILL) ; 

insert_afterjpos_nhpl (tljresult, all_ones 7 leading_ones , 
new__nhpl) ; 

} 

else { // cb =- 1 

// get previous nhpl 

prev_nhpl = get_prev_nhpl ( tl_result , all_ones , leading_ones) 

if (new_nhpl == prev_nhpl) { //PC-->P 
// change bit map from "xl" "xO" 

tljresult ->bmp = { tl_result->bmp & OxFFFFFFFFFFFFFFFELL) 
delete_current_nhpl (tl_result , al^ones, leading_ones) ; 

} 



"llx" 

1, new_nhpl) ; 
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else { // new_nhpl i= prev_nhpl, PC-- > P N 
//no need to change bitmap 

replace_current_nhpl (tl_jresult, all_ones, leading_ones , 
new_nhpl) ; 

} 



} // end of if (pos == 63) 

else { // this is a middle bit 
// get the next bit 
nb = ( (bmp << (pos +!))>> 63); 



if ( (cb =- 0) && (nb == 0) ) { // bmp: "xOOx" 
// change bitmap "xOOx" --> "xllx" 
// 0...0110..0 where the first 1 starts at pos 
bits_mask = ( (1LL<< (63-pos) ) | (1LL<< (62-pos) ) ); 
tl_result->bmp |= bits_mask; 

insert_af ter_jpos_dup_nhpl (tl_result, all_ones, 
leading_ones, new_nhpl) ; 
} // end of (cb == 0, nb == 0) 

else if ( (cb == 0) && (nb == 1) ) { // bmp: "xOlx" 
// get next nhpl 

next_nhpl = get_next_nhpl (tl_result , all_ones , leading_ones) ; 

if (next_nhpl 1= new_nhpl) { // F 1= N 
// change bitmap "xOlx" --> "xllx" 

bits_mask = ( (1LL<< (63-pos) ) | (1LL<< (62-pos) ) ); 
tl_result->bmp |= bits_mask; 

insert_af ter_jpos_nhpl {tl_result, all__ones / 
leading_ones, new_nhpl) ; 

} 

else { // F == N 

// change bitmap "xOlx" --> "xlOx" 
bits_mask = (1LL<< (63-pos) ) ; 
// set pos bit to 1 
tl_result->bmp |= bits_mask; 
// set the next bit to 0 
bits_mask = (1LL<< (62-pos) ) ; 
tl_result->bmp &= -bits__mask; 



//NO need to change NHPL array 
} 

} 



else if ( (cb == 1) && (nb == 0) ) { // bmp: "xlOx" 

prev_nhpl = get_prev__nhpl (tl_re suit, all_ones, lead ing_ones) ; 

if (prev_nhpl != new__nhpl) { // P != N 
// change bit map "xlOx" --> "xllx" 

bits_mask = ( (1LL<< (63-pos) ) | (1LL<< (62-pos) ) ); 
tl_result->bmp |= bits_mask; 
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insert_bef ore_pos_nhpl ( t l_resul t , all_ones , 
leading_ones , new_nhpl) ; 

} 

else { // P == N 

// change bit map "xlOx" --> "xOlx" 
// set pos bit to 0 
bits_mask = (1LL<< (63 -pos) ) ; 
tl__result->bmp &= (-bitsjnask) ; 
// set the next bit to 1 
bits_mask = (1LL<< (62-pos) ) / 
tl__result->bmp |= bits_mask; 

//NO need to change NHPL array 

} 

} 

else if ( (cb == 1) && (nb == 1) ) { // bmp: "xllx" 

next__nhpl = get_next__nhpl (tl_result, all_ones, leading_ones) 
prev_nhpl = get_prev_nhpl (tl_result, all_ones , leading_ones) 

if (next_nhpl == new_nhpl) {//PCF-->PF 
// change the bitmap "xllx" --> "xlOx" 
// set the next bit to 0 
bits_mask = (1LL<< (62-pos) ) ; 
tl_result->bmp &= ~bits_mask; 



delete__current_nhpl (tl_result, all_ones, leading_ones) ; 

} 

else if (prev_nhpl new_nhpl) {//PCF-->PF 
// change the bitmap "xllx" --> M x01x M 
// set the current bit to 0 
bits_mask = (1LL<< (63-pos) ) ; 
tl_result->bmp &= ~bits_mask; 



delete_current_nhpl (tl_result, all_on.es, leading_ones) ; 

} 

else { // P C F --> P N F 

//no need to change the bitmap "xllx" 
replace_current_nhpl (tl_result , all_ones , 
leading_ones, new_nhpl) ; 

} 

} // end of if ( (cb == 1) && (nb == 1)) 
} // End of else this is a middle bit 
} // end of if (old_pl <= pref ix_length) 

} // end of if ( ( (nhpl & 0x8000) == 0) (nhpl != newjohpl) ) 

else if ( (nhpl & 0x8000) != 0) { // the marker bit is 1 
// NO need to change bitmap pattern 
// only need to update T2_RIB 
index = (nhpl & 0x7 FFF) ; 
t2_index = (index « 8) ; 
begin_index = t2_index; 
end_index = t2_index + 255; 

update_t2_rib (begin_index, end_index, pref ix_length, next_hop) 
} // end of if ( (nhpl & 0x8000) !- 0) 
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} // end of for (ti = 0; ti < (l«pl_diff ) ; ...) 
} // end of if (pref ix_length <= 24) 

else { // pref ix_length > 24 
off setl = ( (ip__addr<<18) >>26) ; 
pl_diff = pref ix_length - 24; 

// get the significant bits after the first 24 significant bits 
offset_temp =( (ip_addr<<24) >> (32 - pl_diff) ); 
offset_t2 =( of fset_temp « (32 - pref ix_length) ); 
segment_size = (1 << (32 - pref ix_length) ) ; 

tl_result = &(T1_RIB [segment] ) ; 

bmp = t l_r e suit- >bmp ; 
pos = off setl; 

// count the number of all ones and leading ones 
all__ones = count_leading_ones (bmp, 63); 
leading_ones = count_leading_ones (bmp, pos) ; 

// get the old prefix info 

nhpl ~ get_current_nhpl (tl_result, all_ones, leading_ones) ; 

if ( (nhpl & 0x8000) == 0) { // the marker bit is 0 
//DO need to change bitmap 

t2_index = get_t2__index ( ) ; 

begin_index = (t2_index << 8) ; 

end__index = begin_index + 255; 

cb = ((bmp << pos) >> 63); // get current bit 

// marker the first bit to 1 
tl_new_nhpl = (t2_index | 0x8 000) ; 

if (pos != 63) { // this is NOT the end bit 
// get current bit and next bit 
nb = ( (bmp << (pos +1) ) >> 63) ; 

// for all cases, we need to change bitmap to "xx" -- >"11" 
bits_mask = ( (1LL<< (63 -pos) ) | (1LL<< (62-pos) ) ); 
tl_result->bmp | = bits_mask; 

if ( (cb == 0) (nb == 0) ) { // bitmap: "OOx" -- > "llx" 
insert_af ter_pos_dup_nhpl (tl_result, all_ones, 
leading_ones, tl_new_nhpl) ; 

} 

else if ( (cb == 0) (nb ==!)){ // bitmap: "OOx" -- > "llx" 
insert_after_pos_nhpl (tl_result, all_ones, 
leading_ones, tl_new_nhpl) ; 

} 

else if ( (cb == 1) (nb == 0) ) { // bitmap: "OOx" > "llx" 

insert_before_pos_nhpl (tl_result, all_ones, 
leading_ones, tl_new_nhpl) ; 

} 
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else if ( (cb == 1) && (nb == 1) ) { // bitmap : "0 Ox" -- > "llx 
replace_current_nhpl ( tl_result , all_ones , 
leading_on.es, tl_new_nhpl) ; 

} 

} // end of if (pos 1= 63) 

else { // end bit 

if (cb 0) { // change bitmap: "xO" --> "xl" 
// change bit map from "xO" --> "xl" 
tl_result->bmp |= OxOOOOOOOOOOOOOOOILL; 

insert_af ter_pos_nhpl (tl_result , all_ones 7 leading_ones, 
tl_new_nhpl) ; 

} 

else { // cb == 1 

/ / no need to change bitmap 
replace_current_nhpl (tl_result, all_ones, 
leading__ones, tl__new_nhpl) ; 

} 

} 

// update T2_RIB with old nhpl for those nonmatching segment 
// update T2_RIB with new nhpl for those matching segment 
begin_segment_index = begin_index + of f set_t2 ; 
end_segment_index = begin_segment_index + segment_size - 1; 
f irst_update_t2_rib (begin_index, end_index, begin_segment__index, 
end_segment_index, nhpl, new_nhpl) ; 

} 

else { // the marker bit is 1 
// no need to change bitmap 
t2_index = (nhpl & 0x7 FFF) ; 

begin_index = (t2_index << 8) + offset_t2; 
end_index = begin_index + segment_size - 1; 



update_t2_rib (begin_index, end_index, pref ix_length, next_hop) ; 
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APPENDIX D. Extended Xtensa Instructions with TIE 

state o_lookupl 96 

// field nhopl o_lookupl [31 : 16] 

// field nhop2 o__lookupl [15 : 0] 

// field nhopaddr = o_lookupl [31 : 0] 

state leading_ones 32 

// state all__ones 32 



interface 


VAddr 


32 


core 


out 


interface 


LSSize 


5 


core 


out 


interface 


MemDataInl28 


128 


core 


in 


interface 


MemDataInl6 


16 


core 


in 



opcode LOAD128 op2 = 0 CUSTO 

opcode ALLONES op2=l CUSTO 

opcode GETNHOPADDRFROMT1 op2=2 CUSTO 

opcode INDEXFORT2 op2=3 CUSTO 

opcode GETNHOPFROMT2 op2=4 CUSTO 

opcode LEADONES op2 = 5 CUSTO 

opcode GETNHOPADDRFROMADDR op2=6 CUSTO 

iclass loadl {LOAD128} {out arr f in ars, in art} {out o_lookupl} { 
out VAddr, out LSSize, in MemDataInl28 

} 

// 

// 128 bit load from memory. MemDataInl28 [127 : 64] has the bit map 
// MemDataInl28 [63 : 32] stores either two next hops (each of which is 
// is a 16 bit data or a 32 bit address pointing to a list of 
// next hops. 
// 

reference LOAD128 { 

assign LSSize = 5'blOOOO; 

assign VAddr = ars + art; 

assign arr - MemDataInl28 [63 : 32] ; 

assign o_lookupl = {MemDataInl28 [127 : 32] } ; 

} 

// 

// loads from memory is a 2 cycle operation 
// 

schedule SI {LOAD128} {def o_lookupl 2; def arr 2;} 
iclass compl {ALLONES } {out arr} {in o_lookupl} { 

} 

// Count occurence of all ones in the 64 bit bitmap array 
// 

// Method is 32 1-bit adders at the first level 



// 16 2 -bit adders at the second level 

// 8 3 -bit adders at the third level 

// 4 4 -bit adders at the fourth level 

II 2 5 -bit adders at the fifth level 

// 1 6 -bit adder at the sixth level 
// 



// Reason for parallelism is to speed up performance of 
// addition. Hardware implementation for multi-bit adders 
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// is implemted as ripple carry adders. 

//In order to understand the number of stages in this 

// implemetation 

// 6 XOR stages at the RTL level. 
// 15 CARRY STAGES (1+2+3+4+5) 
// Totaling 21 stage design 

reference ALLONES { 

// first level description 
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wO 
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wire 
wire 



/ / second ] 


.evel 


wire [2 : 0] 


wl_0 
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wl_l 
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wl_2 
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wl_3 







2:0 
2:0 



wl_4 ; 
wl 5; 
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wire [2 


0] 
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wire [2 
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wl 
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// third level description 
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// fourth level description 
wire [4:0] w3_0; 
wire [4:0] w3_l; 
wire [4:0] w3_2 ; 
wire [4:0] w3 3; 



// fifth level description 
wire [5:0] w4_0; 
wire [5:0] w4_l; 

w0_0 = o_lookupl [95] +o_lookupl [94] ; 
w0_l = o_lookupl [93] +o_lookupl [92] ; 
w0_2 = o_lookupl [91] +o_lookupl [90] ; 
w0_3 = o_lookupl [89] +o_lookupl [88] ; 



assign 
assign 
assign 
assign 



assign w0_4 - o_lookupl [87] +o_lookupl [86] ; 

assign w0_5 = o__lookupl [85] +o_lookupl [84] ; 

assign w0_6 = o_lookupl [83] +o_lookupl [82] ; 

assign w0_7 = o_lookupl [81] +o_lookupl [80] ; 
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assign 


w0_ 


_10 




o_ 


_lookupl [75] +o_ 


JLookupl [74] 


assign 


w0_ 


JL1 




o_ 


JLookupl [73] +o_ 


]lookupl [72] 


assign 


w0_ 


_12 




o_ 


_lookupl [71] +o_ 


JLookupl [70] 


assign 


w0_ 


_13 




o 


_lookupl [69] +o_ 


_lookupl [68] 


assign 


w0_ 


_14 




o_ 


lookupl [67] +o_ 


lookupl [66] 


assign 


w0_ 


_15 




o_ 


_lookupl [65] +o_ 


lookupl [64] 


assign 


w0_ 


JL6 




o_ 


JLookupl [63] +o_ 


JLookupl [62] 


assign 


wO 


_17 




o 


^lookupl [61] +o_ 


lookupl [60] 


assign 


wO 


_18 




o_ 


lookupl [59] +o_ 


JLookupl [58] 


assign 


w0_ 


_ 19 




o_ 


_lookupl [57] +o_ 


JLookupl [56] 
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assign w0_20 = o_lookupl [55] +o_lookupl [54] 

assign w0_21 = o_lookupl [53] +o_lookupl [52] 

assign w0_22 = o_lookupl [51] +o_lookupl [50] 

assign w0_23 = o_lookupl [49] +o_lookupl [4 8] 

assign w0_24 - o__lookupl [47] +o_lookupl [46] 

assign w0_25 - o_lookupl [45] +o__lookupl [44] 

assign w0_26 = o_lookupl [43] +o_lookupl [42] 

assign w0_27 = o_lookupl [41] +o_lookupl [40] 

assign w0_28 = o_lookupl [39] +o_lookupl [38] 

assign w0_29 = o_JLookupl [37] +o_lookupl [36] 

assign w0_30 = o_lookupl [35] +o_lookupl [34] 

assign w0_31 = o_lookupl [33] +o_lookupl [32] 

// second level description 



assign 


wl_ 


_0 = 


w0_0+w0_l; 


assign 


wl_ 


_1 = 


w0_2+w0__3 ; 


assign 


wl_ 


_2 = 


w0_4+w0__5 ; 


assign 


wl_ 


[3 = 


w0_6+w0_7; 


assign 


wl_ 


_4 = 


wO 8+w0_9 ; 


assign 


wl_ 


~5 = 


W0_10+w0_ll; 


assign 


wl_ 


_6 = 


w0_12+w0_13 ; 


assign 


wl_ 


1 = 


w0_14+w0_15; 


assign 


wl_ 


_8 = 


wO 16+w0_17; 


assign 


wl_ 


_9 = 


w0_18+w0__19; 


assign 


wl_ 


10 


= W0_20+W0_21; 


assign 


wl_ 


11 


= w0_22+w0_23; 


assign 


wl_ 


12 


= wO_24+wO_25 / 


assign 


wl_ 


JL3 


= w0_26+w0_27; 


assign 


wl_ 


"l4 


= w0__28+w0_29; 


assign 


wl_ 


15 


= wO 30+wO 31; 


// third 


level description 



assign w2_0 = wl_0+wl_l 

assign w2_l = wl_2+wl_3 

ass ign w2__2 = wl_4 +wl_5 

assign w2_3 = wl_6+wl_7 



assign w2_4 = wl_8+wl_9; 

assign w2_5 = wl_10+wl_ll 

assign w2__6 = wl_12+wl_13 

assign w2__7 = wl_14+wl_15 

// fourth level description 



assign w3__0 

assign w3_l 

assign w3_2 

assign w3_3 



= w2_0+w2_l 
= w2_2+w2_3 
= w2_4+w2_5 
= w2 6+w2 7 



// fifth level description 
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assign w4_0 = w3_0+w3_l; 
assign w4_l = w3_2+w3_3 ; 

// sixth level description 

assign arr = w4_0+w4_l; 

// assign all_ones - w4_0+w4__l; 

} 

iclass compl__l {LEADONES} {out arr, in ars} {in o__lookupl, out leading_ones} { 
} 

// Method : 
// 

// Step 1 : result_tmp = o_lookupl>> (63 -Value (ars) ) 

// Step 2 : result = count_ones (result_tmp) 

// 

// First step is implemented as o_lookupl>>~ars [6 : 0] 
// 

// Count occurence of all ones in the 64 bit bitmap array 
// Method is 32 1-bit adders at the first level 



// 16 2 -bit adders at the second level 

// 8 3 -bit adders at the third level 

// 4 4 -bit adders at the fourth level 

// 2 5 -bit adders at the fifth level 

// 1 6 -bit adder at the sixth level 
// 



// Reason for parallelism is to speed up performance of 
// addition. Hardware implementation for multi-bit adders 
// is implemted as ripple carry adders. 
// In order to understand the number of stages in this 
// implemetation 

// 6 XOR stages at the RTL level. 
// 15 CARRY STAGES (1+2+3+4+5) 
// Totaling 21 stage design 
reference LEADONES { 



wire [1 : 


0] 


spw0_ 


_°< 




wire [1 : 


0] 


spw0_ 


_1 , 




wire [1 : 


0] 


spw0_ 


_2 ; 




wire [1 . 


0] 


spw0_ 


3, 




wire [1 


0] 


spw0_ 


_4, 




wire [1 


0] 


spw0_ 






wire [1 


o] 


spw0_ 






wire [1 


0] 


spw0_ 


_7 , 




wire [1 


0] 


spw0_ 






wire [1 


0] 


spw0_ 


9; 


wire [1 


0] 


spw0_ 


10; 


wire [1 


0] 


spw0_ 




wire [1 


0] 


spw0_ 


JL2; 


wire [1 


0] 


spw0_ 


13; 


wire [1 


0] 


spw0_ 


14; 


wire [1 


0] 


spw0_ 




wire [1 


0] 


spw0_ 


16; 


wire [1 


0] 


spw0_ 
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wire [1 : 


0] 


spw0_ 


18; 


wire [1 : 


0] 


spw0_ 


_19; 


wire [1 : 


0] 


spw0_ 


20; 


wire [1 : 


0] 


spw0_ 


21; 


wire [1 : 


o] 


spwO 


22 ; 


wire [1 : 


o] 


spwO_ 


23; 


wire [1 : 


0] 


spwO_ 


_24; 


wire [1 : 


0] 


spwO_ 


25; 


wire [1 : 


0] 


spwO_ 


26; 


wire [1 : 


0] 


spw0_ 


21 ; 


wire [1 : 


0] 


spwO_ 


28; 


wire [1 : 


0] 


spw0_ 


29; 


wire [1 : 


0] 


spwO_ 


30; 


wire [1 : 


0] 


spwO_ 


_31; 



// second level description 





wire [2 


:0] 


spwl_0 , 






wire [2 


:0] 


spwl_l , 






wire [2 


:0] 


spwl_2 , 






wire [2 


:0] 


spwl_3 , 






wire [2 


:0] 


spwl_4 , 






wire [2 


:0] 


SPW1_5 ; 






wire [2 


:0] 


spwl_6 , 






wire [2 


:0] 


spwl__7 j 






wire [2 


:0] 


spwl_8 ; 




wire [2 


:0] 


spwl_9 ; 




wire [2 


:0] 


spwl_10 ; 




wire [2 


:0] 


spwl 11; 




wire [2 


:0] 


spwl__12 ; 




wire [2 


:0] 


spwl_13; 




wire [2 


:0] 


spwl__14 ; 




wire [2 


:0] 


spwl_15 ; 




wire [3 


:0] 


spw2_0 






wire [3 


:0] 


spw2__l 






wire [3 


:0] 


spw2__2 






wire [3 


:0] 


spw2_3 






wire [3 


:0] 


spw2_4 






wire [3 


:0] 


spw2_5 






wire [3 


:0] 


spw2_6 






wire [3 


:0] 


spw2_7 





// fourth level description 

wire [4:0] spw3_0; 

wire [4:0] spw3_l; 

wire [4 : 0] spw3__2 ; 

wire [4:0] spw3_3; 

// fifth level description 
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wi r e [ 5 : 0 ] spw4_0 ; 
wire [5:0] spw4_l ; 



wire [6:0] result; 



wire [95 : 0] lookupl_sp; 



assign lookupl_sp = (o__lookupl>> (~ars [5:0])); 

assign spw0_0 = lookupl__sp [95] +lookupl_sp [94] ; 

assign spw0_l = lookup l_sp [93] -(-lookup l_sp [92] ; 

assign spw0_2 = lookup l__sp [91] + lookup l_sp [90] ; 

assign spw0_3 = lookup l_sp [89] +lookupl_sp [88] ; 

assign spw0_4 = lookup l_sp [87] +lookupl_sp [86] ; 

assign spw0_5 = lookup l_sp [85] +lookupl_sp [84] ; 

assign spw0_6 = lookupl_sp [83] +lookupl_sp [82] ; 

assign spw0_7 = lookupl_sp [81] +lookupl_sp [80] ; 

assign spw0__8 = lookupl_sp [79] +lookupl_sp [78] 

assign spw0_9 = lookup l_sp [77] +lookupl_sp [76] 

assign spw0_10 = lookup l_sp [75] +lookupl_sp [74] 

assign spw0_ll = lookupl_sp [73] +lookupl_sp [72] 



assign 


spw0_ 


_12 




lookup 1 


sp [71] +lookupl_ 


_sp[70] ; 


assign 


spw0_ 


JL3 




lookup 1_ 


_sp [69] +lookupl_ 


sp[68] ; 


assign 


spw0_ 


JL4 




lookup 1_ 


_sp [67] +lookupl_ 


"sp [66] ; 


assign 


spw0_ 


_15 




lookup 1_ 


_sp [65] +lookupl_ 


_sp[64] ; 


assign 


spw0_ 


16 




lookupl_ 


_sp [63] +lookupl_ 


J3p[62] ; 


assign 


spw0_ 


_17 




lookup 1_ 


sp [61] + lookup 1_ 


~sp[60] ; 


assign 


spw0_ 


18 




lookup 1_ 


_sp [59] + lookup 1_ 


~sp[58] ; 


assign 


spw0_ 


"l 9 




lookup 1_ 


_sp [57] +lookupl_ 


_sp[56] ; 


assign 


spw0_ 


20 




lookup 1_ 


sp [55] + lookup 1_ 


„sp[54] ; 


assign 


spw0_ 


_21 




lookup 1_ 


_sp [53] + lookup 1_ 


sp[52] ; 


assign 


spw0_ 


22 




lookup 1_ 


_sp [51] +lookupl_ 


sp[50] ; 


assign 


spw0_ 


23 




lookup 1_ 


_sp [49] +lookupl_ 


sp[48] ; 


assign 


spw0_ 


_24 




lookup 1_ 


sp [47] +lookupl_sp [46] ; 


assign 


spwO 


2 5 




lookup 1 


sp [45] +lookupl_ 


_sp [44] ; 


assign 


spw0_ 


_26 




lookup 1_ 


_sp [43] +lookupl_ 


_sp[42] ; 


assign 


spw0_ 


21 




lookup 1_ 


_sp [41] + lookup 1_ 


_sp[40] ; 


assign 


spw0_ 


_28 




lookup 1_ 


_sp [39] +lookupl_ 


_sp[38] ; 


assign 


spw0_ 


_29 




lookup 1_ 


_sp [37] +lookupl_ 


_sp[36] ; 


assign 


spw0_ 


_3 0 




lookup 1_ 


_sp [35] +lookupl_ 


sp[34] ; 


assign 


spw0_ 


_31 




lookup 1_ 


_sp [33] +lookupl_ 


sp[32] ; 



// second level description 



assign 


spwl_ 


0 


= spw0_ 


_0+spw0_l ; 


assign 


spwl_ 


"l 


= spwO_ 


_2+spw0_3; 


assign 


spwl_ 


~2 


= spw0_ 


_4+spw0__5 ; 


assign 


spwl_ 


~3 


= spw0_ 


_6+spw0_7; 


assign 


spwl_ 


_4 


= spw0_ 


_8 + spw0_9; 


assign 


spwl_ 


5 


= spw0_ 


_10+spw0_ll; 


assign 


spwl_ 


6 


= spw0_ 


_12+spw0_13; 
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assicrn 


spwl 


7 = 


spwO 14+spwO 15; 


assign 


spwl_ 


_8 = 


spw0_16+spw0_17 ; 


assign 


spwl_ 


~9 = 


Spw0_18+spw0_19 ; 


assign 


spwl_ 


_10 - 


= spw0_20+spw0_21; 


assign 


spwl_ 


~11 


= spwO 22+spw0_23; 


assign 


spwl^ 


J- 2 


= spw0_24+spw0_25 ; 


assign 


spwl_ 


~13 


= spw0_26+spw0_27; 


assign 


spwl_ 


~14 


= spw0_28+spw0_29; 


assign 


spwl_ 


_15 


= spwO 30+spw0_31; 


// third 


level 


description 


assign 


spw2_ 


_0 = 


spwl_0+spwl__l ; 


assign 


spw2_ 


_1 = 


spwl_2+spwl_3 ; 


assign 


spw2_ 


_2 = 


spwl_4 +spwl_5 ; 


assign 


spw2_ 


_3 = 


spwl_6+spwl_7 ; 


assign 


spw2_ 


_4 = 


spwl_8+spwl_9 ; 


assign 


spw2_ 


_5 = 


spwl_JLO+spwl_ll ; 


assign 


spw2_ 


6 = 


spwl_12+spwl__13 ; 


assign 


spw2_ 


1 = 


spwl 14+spwl_15; 



// fourth level description 



assign spw3_0 - spw2_0+spw2_l ; 

assign spw3_l - spw2_2+spw2_3 ; 

assign spw3_2 = spw2_4+spw2_5 ; 

assign spw3_3 = spw2_6+spw2_7 ; 

// fifth level description 

assign spw4_0 = spw3_0+spw3_l; 
assign spw4_l = spw3_2+spw3_3 ; 

// sixth level description 

assign leading_ones = spw4_0+spw4_l; 

assign result = {spw4_0+spw4_l-l} ; 

assign arr = {result [6 : 0] , 1 1 bO } ; // 2* (leading_ones-l) 

// 2* (leading_ones-l) gives the 
// result used by GETNHOPADDR 

// schedule S2 {ALLONES} {def all_ones 1; def arr 1;} 
schedule S2 {ALLONES} {def arr 1;} 

schedule S2L {LEADONES} {def leading_ones 1; def arr 1;} 

iclass comp2 { GETNHOPADDRFROMT1 } {out arr} {in leading_ones, in o_lookupl} {} 
// 

// If leading_ones == 1 then return o_lookupl [31 : 16] otherwise 
// return o__lookupl [15 : 0] 

// 

reference GETNHOPADDRFROMTl { 

assign arr = (leading_ones == 1) ? o_lookupl [31 : 16] : o_lookupl [15 : 0] ; 

} 
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schedule S3 { GETNH0PADDRFR0MT1 } {def arr 1;} 



iclass comp2_l {GETNHOPADDRFROMADDR} {in ars, in art, out arr} {} { 
out VAddr, out LSSize, in MemDataInl6 

} 

// 

// 16bit load to get nhop from a list 

// ars is the 32 bit base address stored in o_lookupl [63 : 32] 
// art is the 16 bit offset from the base address which is 
// computed as 2* (leading_ones - 1) 
reference GETNHOPADDRFROMADDR { 

assign LSSize = 5 T b00010; 

assign VAddr = ars [31:0] + art [15:0]; 

assign arr = MemDataInl6 ; 

} 

// 
// 

schedule S3_l { GETNHOPADDRFROMADDR } {def arr 2;} 
// 

iclass load2_sh { GETNHOPFROMT2 } {out arr, in ars, in art} {} { 
out VAddr, out LSSize, in MemDataInl6 

} 

// 

// 16 bit load to get nhop from T2_RIB 
// ars is the base address & (T2__RIB [0] ) 

// art is the offset which is computed from INDEXFORT2 
// 

reference GETNHOPFROMT2 { 
assign LSSize = 5'bOOOlO; 
assign VAddr = ars [31:0] + art [15:0]; 
assign arr = {6 'bO ,MemDataInl6 [15:6] } ; 

} 

// 
// 

schedule S4_S {GETNHOPFROMT2 } {def arr 2;} 

iclass index { INDEXFORT2 } {out arr, in ars, in art} {} { 
} 

// 

// Table2 Index = 2* (nhop [14 : 0] *256) + & (T2_RIB [0] ) 
// 

reference INDEXF0RT2 { 

assign arr = { { {ars [7 : 0] , 8 • b0}+art [15 : 0] }<<l} ; 

} 

// 

schedule S6 { INDEXFORT2 } {def arr 1;} 
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APPENDIX E A Sample of C Code for Route Lookup with New Extended Instructions 

static unsigned int rt_lookup_tie (unsigned int ip_addr) { 
// get the most significant 18 bits from IP address 
// and appended with 4 zeros since in TIE data is arranged by 
// byte while in T1_RIB by 128 bits, 
unsigned int offset = ( (ip_addr>>14) <<4) ; 
unsigned short int tloffset; 
unsigned int nhpladdr, all_ones; 
unsigned int bytepos_leading_ones, nhpl; 

static Tl_Entry *tl_base = & (T1_RIB [0] ) ; // get T1_RIB base address 
static unsigned short *t2_base = & (T2_RIB [0] ) ; // T2_RIB base address 

nhpladdr - L0AD128 (tl_base, offset) ; // load the 128 bit from T1_RIB 
tloffset = ( (ip_addr«18) »26) ; // get the middle 6 bits in ip_addr 
all_ones = ALLONES () ; 

bytepos_leading_ones = LEADONES (tloffset) ; 

if (all_ones <= 2) 

nhpl = GETNHOPADDRPROMT1 (); 
else 

nhpl = GETNHOPADDRFROMADDR (bytepos_leading_ones , nhpladdr) ; 

if ( (nhpl >>15) == 0) { // get the marker bit 
return nhpl>>6; 

} 

else { 

unsigned short int t2offset = ( (ip_addr<<24) »24) ; 

unsigned int t 2 segment _n_of f set = INDEXFORT2 (nhpl , t2off set) ; 

return GETNHO P FROMT 2 (t2_base, t2segment__n_of f set) ; 

} 

} 
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APPENDIX F Cycle Count of Route Lookup Function 



00750000 : 


40057504 : 


<rt lookup_tie> : 






00750000 : 


40057504 : 


6cl004 


entry 


al, 


32 


00250000 : 


40057507 : 


d520 


mov.n 


a5, 


a2 


00255313 : 


40057509 : 


14fd22 


132r 


a4, 


40056994 


00250000 : 


4005750c : 


05e314 


srli 


a3 f 


a5, 14 


00258399 : 


4005750f : 


244200 


132i 


a4 f 


a4, 0 


00250000 : 


40057512 : 


0C3311 


slli 


a3, 


a3, 4 


01043576 : 


40057515 : 


034660 


loadl28 


a6 , 


a4, a3 


00500000 : 


40057518 : 


000461 


allones 


a4 




00250000 : 


4005751b : 


058345 


extui 


a3, 


a5, 8, 6 


00250007 


4005751e : 


003265 


leadones a2 


f a3 


00250000 


40057521 : 


6f4305 


bgeui 


a4, 


3,4005752c 


00187163 


40057524 


000462 


getnhopaddrf romtl a4 


00187163 


40057527 


600002 


j 


4005752d 


00471684 


4005752a 


062466 


getnhopaddrfromaddr a: 


00687163 


: 4005752d 


: 04f314 


srli 


a3, 


a4, 15 


00250006 


: 40057530 


: CC34 


bnez.n 


a3 , 


40057538 


00249821 


: 40057532 


: 046214 


srli 


a2, 


a4, 6 


00249821 


: 40057535 


: 060000 


retw 






00000537 


: 40057538 


: 13fdl8 


132r 


a3, 


40056998 


00000179 


: 4005753b 


: 050247 


extui 


a2, 


a5, 0, 8 


00000179 


: 4005753e 


: 8330 


132i.n 


a3. 


a3, 0 


00000185 


: 40057540 


: 024263 


indexfort2 


a2 , a4 , 


00001115 


: 40057543 


: 023264 


getnhopf romt2 a2, a3 


00000179 


: 40057546 


: dlOf 


retw.n 







total cycles in block »rt_lookup_tie" : 6592490 
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